package com.zyf.chapter01.principle.LOD;

import com.zyf.chapter01.principle.LOD.utils.Html;

/**
 * A web page document.
 * <p>
 * Content extraction, tokenization and indexing all use {@code Document} as
 * the object they operate on.
 *
 * @author yifeng
 */
public class Document {
    private final Html html;
    private final String url;

    /**
     * Creates a document for {@code url}, obtaining its HTML by creating a new
     * {@code HtmlDownloader} and calling {@code downloadHtml(url)} on it.
     * <p>
     * Kept for existing callers. Prefer {@link #Document(String, Html)} when
     * the HTML is already available or when the download should be controlled
     * by the caller (for example in tests).
     *
     * @param url address of the page; passed unchanged to the downloader
     */
    public Document(String url) {
        // The download is evaluated before delegation, so a failure inside
        // downloadHtml still aborts construction exactly as before.
        this(url, new HtmlDownloader().downloadHtml(url));
    }

    /**
     * Creates a document from HTML that has already been obtained.
     * <p>
     * This constructor only stores its arguments; it does not create or call
     * an {@code HtmlDownloader}.
     *
     * @param url  address the HTML belongs to
     * @param html content of the page
     */
    public Document(String url, Html html) {
        this.url = url;
        this.html = html;
    }
    // ...
}
